Assignment No. 2 


Programming for Big Data 


Question No. 1: 


import pandas as pd 

# Question 1: find the values that appear in exactly one of the two lists
# (the symmetric difference), keeping the original order of each list.
a = [21, 5, 34, 17, 3, 29, 4, 65]
b = [2, 34, 11, 7, 35, 9, 17, 4]

myvar1 = pd.Series(a)
myvar2 = pd.Series(b)

# Values of the first Series that do not occur anywhere in the second.
result1 = myvar1[~myvar1.isin(myvar2)]
# Values of the second Series that do not occur anywhere in the first.
result2 = myvar2[~myvar2.isin(myvar1)]

# Stack both filtered Series; each keeps its own original index labels,
# so the combined index may contain repeated labels.
result1 = pd.concat([result1, result2], axis=0)
print(result1)


Question No. 2: 


import pandas as pd 
# Question 2: build a small car data set and inspect it group by group,
# first grouped by manufacturer ("car") and then by "year".
data = {
    'year': [2010, 2005, 2010, 2020, 2010, 2005, 2005, 2020],
    'model': ['Citigo', 'Fabia', 'Fiesta', 'Rapid', 'Focus', 'Mondeo', 'Octavia', 'B-Max'],
    'car': ['Skoda', 'Skoda', 'Ford', 'Skoda', 'Ford', 'Ford', 'Skoda', 'Ford'],
}
df = pd.DataFrame(data)

# --- Group by the "car" column ---
# Note: despite its name, new_df is a pandas GroupBy object, not a DataFrame.
new_df = df.groupby("car")

# Print every group: the group key followed by the rows belonging to it.
for car_name, car_rows in new_df:
    print(car_name)
    print(car_rows)
    print()  # blank line between groups

# Print a single group selected by its key.
print(new_df.get_group("Ford"))

# --- Group by the "year" column ---
new_df = df.groupby("year")

# Print every group: the group key followed by the rows belonging to it.
for year, year_rows in new_df:
    print(year)
    print(year_rows)
    print()  # blank line between groups

# Print a single group selected by its key.
print(new_df.get_group(2010))


